---
title: mahoudata
keywords: fastai
sidebar: home_sidebar
summary: "API details."
---
# Read the datathon dataset from the local data directory.
df = pd.read_csv("./data/dataset-datathon.csv")

# Build a profiling report of the raw frame (full-width HTML layout) and
# display it through the report's notebook-iframe renderer.
report_html_options = {'style': {'full_width': True}}
profile = ProfileReport(
    df,
    title='Pandas Profiling Report',
    html=report_html_options,
)
profile.to_notebook_iframe()
According to the profile report, 60% of the rows are duplicates. Remove them.
# Drop rows that are duplicated across all columns; `df` itself is left
# untouched and the result is kept in `df_clean`.
df_clean = df.drop_duplicates(
    # Alternative kept for reference: compare rows on every column except
    # 'vajilla'.
    # subset = df.columns.difference(['vajilla'])
)

# Profile the de-duplicated frame. Profiling `df` again here would just
# reproduce the first report and hide the effect of drop_duplicates().
profile = ProfileReport(
    df_clean,
    title='Pandas Profiling Report',
    html={'style': {'full_width': True}},
)
profile.to_notebook_iframe()
# Names of the columns handed to the recommender as its numeric features.
numeric_feature_names = [
    'lupulo_afrutado_citrico',
    'lupulo_floral_herbal',
    'amargor',
    'color',
    'maltoso',
    'licoroso',
    'afrutado',
    'especias',
    'acidez',
]
context = {'numeric_cols': numeric_feature_names}

# Ask the factory for the 'numeric' strategy configured with that context.
f = RecommenderStrategyFactory(context)
strategy = f.createStrategy('numeric')

# Build the strategy's data model and run the strategy on it.
# NOTE(review): the model is built from the raw `df`, not the de-duplicated
# `df_clean` -- confirm this is intended.
datamodel = strategy.model_builder(df)
recommender_df = strategy.exec_strategy(datamodel)
recommender_df

# Take the entry keyed by 1 from the result and list its values in
# ascending order, wrapped in a DataFrame for display.
# presumably each key identifies one item of the dataset -- TODO confirm
entry_one = recommender_df[1]
entry_one_sorted = entry_one.sort_values(ascending=True)
recommendations_example = pd.DataFrame(entry_one_sorted)
recommendations_example